% Cherry and Guo, NAACL-HLT 2015 (ACL Anthology N15-1075).
% "Twitter" is brace-protected so sentence-casing styles keep its capital.
@inproceedings{cherry-guo:2015:NAACL-HLT,
  author    = {Cherry, Colin and Guo, Hongyu},
  title     = {The Unreasonable Effectiveness of Word Representations for {Twitter} Named Entity Recognition},
  booktitle = {Proceedings of the 2015 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies},
  month     = {May--June},
  year      = {2015},
  address   = {Denver, Colorado},
  publisher = {Association for Computational Linguistics},
  pages     = {735--745},
  url       = {http://www.aclweb.org/anthology/N15-1075}
}

% Gupta and Manning, NAACL-HLT 2015 (ACL Anthology N15-1128).
@inproceedings{gupta-manning:2015:NAACL-HLT,
    title = {Distributed Representations of Words to Guide Bootstrapped Entity Classifiers},
    author = {Gupta, Sonal  and  Manning, Christopher D.},
    booktitle = {Proceedings of the 2015 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies},
    publisher = {Association for Computational Linguistics},
    address = {Denver, Colorado},
    year = {2015},
    month = {May--June},
    pages = {1215--1220},
    url = {http://www.aclweb.org/anthology/N15-1128}
}



% Thrun's 1995 technical report on lifelong learning.
% NOTE(review): the original entry had an empty institution (a required
% techreport field). The institution, report number and address below are
% filled in from the commonly published citation -- confirm against the
% report's cover page.
@techreport{Thrun95lifelonglearning,
  author      = {Thrun, Sebastian},
  title       = {Lifelong Learning: A Case Study},
  institution = {Carnegie Mellon University, Computer Science Department},
  number      = {CMU-CS-95-208},
  address     = {Pittsburgh, PA},
  year        = {1995}
}

% Thrun, 1996, in Advances in Neural Information Processing Systems.
@inproceedings{Thrun:96,
  title     = {Is Learning The n-th Thing Any Easier Than Learning The First?},
  author    = {Sebastian Thrun},
  booktitle = {Advances in Neural Information Processing Systems},
  publisher = {The MIT Press},
  pages     = {640--646},
  year      = {1996}
}


% Baxter, 1997. This is a journal article (Machine Learning), so it is typed
% as an article with the venue in the journal field rather than booktitle.
% Volume/number match the other Machine Learning 1997 entry in this file
% (pages 41--75 of volume 28, number 1).
@article{Baxter:97,
  author  = {Baxter, Jonathan},
  title   = {A {Bayesian}/Information Theoretic Model of Learning to Learn via Multiple Task Sampling},
  journal = {Machine Learning},
  volume  = {28},
  number  = {1},
  pages   = {7--39},
  year    = {1997}
}

% Arnold, Nallapati and Cohen, ICDM Workshops 2007.
% numpages and acmid are export metadata that standard styles ignore.
@InProceedings{Arnold:07,
  title     = {A Comparative Study of Methods for Transductive Transfer Learning},
  author    = {Arnold, Andrew and Nallapati, Ramesh and Cohen, William W.},
  booktitle = {Proceedings of the Seventh IEEE International Conference on Data Mining Workshops},
  series    = {ICDMW '07},
  publisher = {IEEE Computer Society},
  address   = {Washington, DC, USA},
  year      = {2007},
  pages     = {77--82},
  numpages  = {6},
  isbn      = {0-7695-3033-8},
  acmid     = {1336050}
}

% Arnold, Nallapati and Cohen, ACL 2008.
% Fixes relative to the exported record: page range uses an en-dash (--),
% the trailing period is dropped from the title (styles add punctuation),
% the proceedings title is spelled out as in the other ACL-08 entry of this
% file, and the publisher name is corrected.
@inproceedings{Arnold:08,
  author    = {Arnold, Andrew and Nallapati, Ramesh and Cohen, William W.},
  title     = {Exploiting Feature Hierarchy for Transfer Learning in Named Entity Recognition},
  booktitle = {Proceedings of ACL-08: HLT},
  editor    = {McKeown, Kathleen and Moore, Johanna D. and Teufel, Simone and Allan, James and Furui, Sadaoki},
  year      = {2008},
  pages     = {245--253},
  publisher = {Association for Computational Linguistics},
  isbn      = {978-1-932432-04-6}
}


% Chelba and Acero, EMNLP 2004.
% The month uses the predefined jul macro so styles can abbreviate or
% localise it; the year is braced like the other entries in this file.
@inproceedings{Chelba:04,
  author    = {Chelba, Ciprian and Acero, Alex},
  title     = {Adaptation of Maximum Entropy Capitalizer: Little Data Can Help a Lot},
  booktitle = {Proceedings of EMNLP 2004},
  editor    = {Lin, Dekang and Wu, Dekai},
  year      = {2004},
  month     = jul,
  address   = {Barcelona, Spain},
  publisher = {Association for Computational Linguistics},
  pages     = {285--292}
}

% Sutton and McCallum, HLT/EMNLP 2005.
% location is the conference venue; address is the publisher's city.
@InProceedings{Sutton:05,
  title     = {Composition of Conditional Random Fields for Transfer Learning},
  author    = {Sutton, Charles and McCallum, Andrew},
  booktitle = {Proceedings of the Conference on Human Language Technology and Empirical Methods in Natural Language Processing},
  series    = {HLT '05},
  location  = {Vancouver, British Columbia, Canada},
  publisher = {Association for Computational Linguistics},
  address   = {Stroudsburg, PA, USA},
  year      = {2005},
  pages     = {748--754},
  numpages  = {7},
  doi       = {10.3115/1220575.1220669},
  url       = {http://dx.doi.org/10.3115/1220575.1220669},
  acmid     = {1220669}
}

% Florian et al., HLT-NAACL 2004.
% The booktitle no longer starts with "In": bibliography styles insert that
% word themselves, so the original rendered as "In In NAACL/HLT".
% NOTE(review): the spelled-out proceedings title is taken from the ACL
% Anthology record as recalled -- confirm before publication.
@inproceedings{Florian:04,
  author    = {Florian, R. and Hassan, H. and Ittycheriah, A. and Jing, H. and Kambhatla, N. and Luo, X. and Nicolov, N. and Roukos, S.},
  title     = {A Statistical Model for Multilingual Entity Detection and Tracking},
  booktitle = {Proceedings of the Human Language Technology Conference of the North American Chapter of the Association for Computational Linguistics: {HLT-NAACL} 2004},
  year      = {2004},
  pages     = {1--8}
}


% Caruana, Machine Learning 28(1), 1997.
% The journal name is stored in full (not "Mach. Learn.") so it matches the
% other Machine Learning entry in this file and styles can abbreviate it.
% issue_date, numpages and acmid are export metadata ignored by standard styles.
@article{Caruana:97,
  author     = {Caruana, Rich},
  title      = {Multitask Learning},
  journal    = {Machine Learning},
  issue_date = {July 1997},
  volume     = {28},
  number     = {1},
  month      = jul,
  year       = {1997},
  issn       = {0885-6125},
  pages      = {41--75},
  numpages   = {35},
  url        = {http://dx.doi.org/10.1023/A:1007379606734},
  doi        = {10.1023/A:1007379606734},
  acmid      = {262872},
  publisher  = {Kluwer Academic Publishers},
  address    = {Hingham, MA, USA},
  keywords   = {backpropagation, generalization, inductive transfer, k-nearest neighbor, kernel regression, multitask learning, parallel transfer, supervised learning}
}


% Kim, Kang and Choi, COLING 2002.
% location is the conference venue; address is the publisher's city.
@InProceedings{Kim:2002,
  title     = {Unsupervised Named Entity Classification Models and Their Ensembles},
  author    = {Kim, Jae-Ho and Kang, In-Ho and Choi, Key-Sun},
  booktitle = {Proceedings of the 19th International Conference on Computational Linguistics - Volume 1},
  series    = {COLING '02},
  location  = {Taipei, Taiwan},
  publisher = {Association for Computational Linguistics},
  address   = {Stroudsburg, PA, USA},
  year      = {2002},
  pages     = {1--7},
  numpages  = {7},
  doi       = {10.3115/1072228.1072316},
  url       = {http://dx.doi.org/10.3115/1072228.1072316},
  acmid     = {1072316}
}

% Tjong Kim Sang, CoNLL-2002 shared task overview.
% "CoNLL-2002" is brace-protected so sentence-casing styles do not turn it
% into "conll-2002"; this matches the protection used for the CoNLL-2000
% entry in this file.
@inproceedings{TjongKimSang:2002,
  author    = {Tjong Kim Sang, Erik F.},
  title     = {Introduction to the {CoNLL-2002} Shared Task: Language-independent Named Entity Recognition},
  booktitle = {Proceedings of the 6th Conference on Natural Language Learning - Volume 20},
  series    = {COLING-02},
  year      = {2002},
  pages     = {1--4},
  numpages  = {4},
  url       = {http://dx.doi.org/10.3115/1118853.1118877},
  doi       = {10.3115/1118853.1118877},
  acmid     = {1118877},
  publisher = {Association for Computational Linguistics},
  address   = {Stroudsburg, PA, USA}
}

% Collins and Singer, EMNLP/VLC 1999.
% The booktitle no longer starts with "In": bibliography styles insert that
% word themselves, so the original rendered as "In In Proceedings ...".
@inproceedings{Collins:99,
  author    = {Collins, Michael and Singer, Yoram},
  title     = {Unsupervised Models for Named Entity Classification},
  booktitle = {Proceedings of the Joint SIGDAT Conference on Empirical Methods in Natural Language Processing and Very Large Corpora},
  year      = {1999},
  pages     = {100--110}
}


% Liao and Veeramachaneni, NAACL HLT 2009 workshop on semi-supervised learning.
% location is the workshop venue; address is the publisher's city.
@InProceedings{Liao:2009,
  title     = {A Simple Semi-supervised Algorithm for Named Entity Recognition},
  author    = {Liao, Wenhui and Veeramachaneni, Sriharsha},
  booktitle = {Proceedings of the NAACL HLT 2009 Workshop on Semi-Supervised Learning for Natural Language Processing},
  series    = {SemiSupLearn '09},
  location  = {Boulder, Colorado},
  publisher = {Association for Computational Linguistics},
  address   = {Stroudsburg, PA, USA},
  year      = {2009},
  pages     = {58--65},
  numpages  = {8},
  isbn      = {978-1-932432-38-1},
  url       = {http://dl.acm.org/citation.cfm?id=1621829.1621837},
  acmid     = {1621837}
}


% Tjong Kim Sang and Buchholz, CoNLL-2000 shared task overview.
% The stray run of spaces in the title is removed and the first author is
% written in "Last, First" form, matching the CoNLL-2002 entry in this file.
% NOTE(review): the spelled-out proceedings title and page range come from
% the commonly published citation -- confirm against the ACL Anthology.
@inproceedings{TjongKimSang:Buchholz:2000,
  author    = {Tjong Kim Sang, Erik F. and Buchholz, Sabine},
  title     = {Introduction to the {CoNLL-2000} Shared Task: Chunking},
  booktitle = {Proceedings of {CoNLL-2000} and {LLL-2000}},
  year      = {2000},
  pages     = {127--132},
  address   = {Lisbon, Portugal}
}

% Ben Abacha and Zweigenbaum, 2011.
% This is a workshop paper, not a journal article, so it is typed as
% inproceedings with the venue in booktitle instead of journal.
% The first author's compound surname is "Ben Abacha"; the comma form keeps
% it together.
% NOTE(review): given names, proceedings title, full page range, venue and
% month are from the ACL Anthology record as recalled (the original had
% only "ACL HLT 2011" and a single page, 56) -- confirm before publication.
@inproceedings{abacha:2011,
  author    = {Ben Abacha, Asma and Zweigenbaum, Pierre},
  title     = {Medical Entity Recognition: A Comparison of Semantic and Statistical Methods},
  booktitle = {Proceedings of {BioNLP} 2011 Workshop},
  year      = {2011},
  month     = jun,
  address   = {Portland, Oregon},
  publisher = {Association for Computational Linguistics},
  pages     = {56--64},
  keywords  = {i2b2 2010 challenge corpus, LIMSI-CNRS, MetaMap, Named entity extraction, Noun phrase chunking}
}


% Jiang and Zhai, ACL 2007 (ACL Anthology P07-1034).
% The acronym is protected with plain braces rather than a hard-coded
% \uppercase command; the month uses the predefined jun macro.
@inproceedings{jiang:2007,
  author    = {Jiang, Jing and Zhai, ChengXiang},
  title     = {Instance Weighting for Domain Adaptation in {NLP}},
  booktitle = {Proceedings of the 45th Annual Meeting of the Association of Computational Linguistics},
  month     = jun,
  year      = {2007},
  address   = {Prague, Czech Republic},
  publisher = {Association for Computational Linguistics},
  pages     = {264--271},
  url       = {http://www.aclweb.org/anthology/P07-1034}
}

% Daume III, ACL 2007 (ACL Anthology P07-1033).
% The accent in the surname is restored using a BibTeX special character
% ({\'e}) so sorting and labels treat it as a single letter; the month uses
% the predefined jun macro.
@inproceedings{daumeiii:2007:ACLMain,
  author    = {Daum{\'e} III, Hal},
  title     = {Frustratingly Easy Domain Adaptation},
  booktitle = {Proceedings of the 45th Annual Meeting of the Association of Computational Linguistics},
  month     = jun,
  year      = {2007},
  address   = {Prague, Czech Republic},
  publisher = {Association for Computational Linguistics},
  pages     = {256--263},
  url       = {http://www.aclweb.org/anthology/P07-1033}
}

% Richman and Schone, ACL-08: HLT (ACL Anthology P08-1001).
% The month uses the predefined jun macro so styles can abbreviate or
% localise it.
@inproceedings{richman-schone:2008:ACLMain,
  author    = {Richman, Alexander E. and Schone, Patrick},
  title     = {Mining Wiki Resources for Multilingual Named Entity Recognition},
  booktitle = {Proceedings of ACL-08: HLT},
  month     = jun,
  year      = {2008},
  address   = {Columbus, Ohio},
  publisher = {Association for Computational Linguistics},
  pages     = {1--9},
  url       = {http://www.aclweb.org/anthology/P/P08/P08-1001}
}

% Collobert and Weston, ICML 2008 (DBLP export).
% The title is stored in Title Case (styles can lowercase it but cannot
% restore lost capitals) and the acronym in booktitle is braced as a whole
% word instead of together with the opening parenthesis.
% NOTE(review): crossref points at a proceedings entry with key
% DBLP:conf/icml/2008; make sure that entry exists in the bibliography
% (and, for classic BibTeX, appears after this one).
@inproceedings{Collobert08,
  author    = {Collobert, Ronan and Weston, Jason},
  title     = {A Unified Architecture for Natural Language Processing: Deep Neural Networks with Multitask Learning},
  booktitle = {Machine Learning, Proceedings of the Twenty-Fifth International Conference ({ICML} 2008), Helsinki, Finland, June 5-9, 2008},
  pages     = {160--167},
  year      = {2008},
  crossref  = {DBLP:conf/icml/2008},
  url       = {http://doi.acm.org/10.1145/1390156.1390177},
  doi       = {10.1145/1390156.1390177},
  timestamp = {Thu, 14 Aug 2008 13:58:39 +0200},
  biburl    = {http://dblp.uni-trier.de/rec/bib/conf/icml/CollobertW08},
  bibsource = {dblp computer science bibliography, http://dblp.org}
}

% Yosinski, Clune, Bengio and Lipson, NIPS 27 (2014).
% Editor initials are separated by spaces ("N. D.", "K. Q."): BibTeX treats
% a glued "N.D." as one name token, so abbreviating styles would drop the
% second initial. The title is stored in Title Case so no capitals are lost.
@incollection{Yosinski:2014,
  author    = {Yosinski, Jason and Clune, Jeff and Bengio, Yoshua and Lipson, Hod},
  title     = {How Transferable Are Features in Deep Neural Networks?},
  booktitle = {Advances in Neural Information Processing Systems 27},
  editor    = {Z. Ghahramani and M. Welling and C. Cortes and N. D. Lawrence and K. Q. Weinberger},
  pages     = {3320--3328},
  year      = {2014},
  publisher = {Curran Associates, Inc.},
  url       = {http://papers.nips.cc/paper/5347-how-transferable-are-features-in-deep-neural-networks.pdf}
}

% Maynard et al., RANLP 2001.
% The booktitle no longer starts with "In": bibliography styles insert that
% word themselves, so the original rendered as "In In Recent Advances ...".
@inproceedings{Maynard:01,
  author    = {Maynard, Diana and Tablan, Valentin and Ursu, Cristian and Cunningham, Hamish and Wilks, Yorick},
  title     = {Named Entity Recognition from Diverse Text Types},
  booktitle = {Recent Advances in Natural Language Processing 2001 Conference, Tzigov Chark},
  year      = {2001}
}

% Nadeau and Sekine, Lingvisticae Investigationes 30(1), 2007.
% The year holds the four-digit year only (the exported value was an ISO
% timestamp, which styles print verbatim and cannot sort), the page range
% uses an en-dash (--), and the keyword list uses the field name "keywords"
% like the other entries in this file.
@article{Nadeau:2007,
  author   = {Nadeau, David and Sekine, Satoshi},
  title    = {A Survey of Named Entity Recognition and Classification},
  journal  = {Lingvisticae Investigationes},
  volume   = {30},
  number   = {1},
  year     = {2007},
  pages    = {3--26},
  abstract = {This survey covers fifteen years of research in the Named Entity Recognition and Classification (NERC) field, from 1991 to 2006. We report observations about languages, named entity types, domains and textual genres studied in the literature. From the start, NERC systems have been developed using hand-made rules, but now machine learning techniques are widely used. These techniques are surveyed along with other critical aspects of NERC such as features and evaluation methods. Features are word-level, dictionary-level and corpus-level representations of words in a document. Evaluation techniques, ranging from intuitive exact match to very complex matching techniques with adjustable cost of errors, are an indisputable key to progress.},
  keywords = {EVALUATION, FEATURE SPACE, LEARNING METHOD, NAMED IDENTITY, SURVEY}
}



% Chiticariu et al., EMNLP 2010.
% location is the conference venue; address is the publisher's city.
@inproceedings{Chiticariu:2010,
  title     = {Domain Adaptation of Rule-based Annotators for Named-entity Recognition Tasks},
  author    = {Chiticariu, Laura and Krishnamurthy, Rajasekar and Li, Yunyao and Reiss, Frederick and Vaithyanathan, Shivakumar},
  booktitle = {Proceedings of the 2010 Conference on Empirical Methods in Natural Language Processing},
  series    = {EMNLP '10},
  location  = {Cambridge, Massachusetts},
  publisher = {Association for Computational Linguistics},
  address   = {Stroudsburg, PA, USA},
  year      = {2010},
  pages     = {1002--1012},
  numpages  = {11},
  url       = {http://dl.acm.org/citation.cfm?id=1870658.1870756}
}



